# coding=utf-8
import re
import time

# Wall-clock timestamp captured at import time, before the docx imports below
# run. Nothing in the visible part of this file reads it afterwards.
time1 = time.time()
import docx
from docx import Document

# Module-level list, initially empty. It is not referenced anywhere in the
# visible part of this file -- NOTE(review): confirm whether other code uses it.
result = []


class DocxReader:
    """Read the paragraph text of a ``.docx`` document through python-docx."""

    def __init__(self):
        """Create a reader. The instance keeps no state."""

    def parse(self, _path, separator="") -> str:
        """Return the concatenated text of the document's paragraphs.

        Only ``Document.paragraphs`` is read; content that python-docx does
        not expose through that attribute is not part of the result.

        Args:
            _path: Location of the ``.docx`` file. It is handed unchanged to
                ``docx.Document``.
            separator: String placed between consecutive paragraph texts.
                The default (empty string) keeps the historical behaviour of
                joining paragraphs with nothing in between; pass ``"\n"`` to
                keep paragraph boundaries visible.

        Returns:
            The paragraph texts joined by ``separator``, or an empty string
            when the document has no paragraphs.

        Raises:
            Whatever ``docx.Document`` raises when ``_path`` cannot be opened
            or is not a valid document; no exception is caught here.
        """
        document = Document(_path)
        # str.join builds the result in one pass instead of growing a string
        # with += once per paragraph.
        return separator.join(paragraph.text for paragraph in document.paragraphs)


if __name__ == '__main__':
    # Manual run against a sample document. The extracted text is neither
    # stored nor printed, so this only exercises the parsing path.
    sample_path = "./tempFile/附件关于印发大型工程技术风险控制要点的通知.docx"
    docx_reader = DocxReader()
    docx_reader.parse(sample_path)
